import random
# Candidate school names for the records that carry the optional columns.
schools = ("cuit", "dbke", "tap4fun", 'tencet')

# Write 10,000,000 synthetic student rows to data.csv (no header line).
# Every row has: name, age, gender, height.
# Roughly 40% of rows have two extra columns: avg_score, school.
# The `with` block guarantees the file is closed even if a write fails
# part-way through the loop.
with open("data.csv", 'w') as f:
    for i in range(1, 1000*10000+1):
        name = "name_%d" % i
        # Integer age in 10..19.
        age = int(random.random() * 10) + 10
        # A random digit 0..9 is even half of the time -> ~50% 'female'.
        gender = 'male'
        if int(random.random() * 10) % 2 == 0:
            gender = 'female'
        # Integer height in 150..169.
        height = int(random.random() * 20) + 150
        # Digits 0, 3, 6 and 9 pass the test -> ~40% of rows get the
        # extended six-column form.
        if int(random.random() * 10) % 3 == 0:
            avg_score = random.random() * 100
            school = random.choice(schools)
            # NOTE: %d truncates the float avg_score to an integer 0..99.
            row = "%s,%d,%s,%d,%d,%s\n" % (
                name, age, gender, height, avg_score, school)
        else:
            row = "%s,%d,%s,%d\n" % (name, age, gender, height)
        f.write(row)
